Decision tree using default settings
# Seed the RNG so the cross-validated columns of the CP table (xerror, xstd)
# are reproducible from run to run.
set.seed(20)

# Classification tree for deg_malig on the eight clinical predictors.
# Splits are chosen by information gain; rpart.control() is called with no
# arguments, so every growth/pruning setting stays at the package default.
fit <- rpart(
  formula = deg_malig ~ age + breast + breast_quad + inv_nodes + irradiat +
    menopause + node_caps + tumor_size,
  data = breast_cancer,
  method = "class",
  parms = list(split = "information"),
  control = rpart.control()
)

# Print the CP table, variable importance and the per-node split details.
summary(fit)
## Call:
## rpart(formula = deg_malig ~ age + breast + breast_quad + inv_nodes +
## irradiat + menopause + node_caps + tumor_size, data = breast_cancer,
## method = "class", parms = list(split = "information"), control = rpart.control())
## n= 277
##
## CP nsplit rel error xerror xstd
## 1 0.04391892 0 1.0000000 1.000000 0.05609499
## 2 0.02027027 2 0.9121622 1.020270 0.05599795
## 3 0.01351351 3 0.8918919 1.114865 0.05518860
## 4 0.01126126 10 0.7905405 1.168919 0.05445505
## 5 0.01000000 13 0.7567568 1.148649 0.05475386
##
## Variable importance
## inv_nodes tumor_size node_caps age menopause breast_quad
## 26 23 15 12 9 9
## breast irradiat
## 5 2
##
## Node number 1: 277 observations, complexity param=0.04391892
## predicted class=2 expected loss=0.534296 P(node) =1
## class counts: 66 129 82
## probabilities: 0.238 0.466 0.296
## left son=2 (209 obs) right son=3 (68 obs)
## Primary splits:
## inv_nodes splits as LRRRRRR, improve=20.974280, (0 missing)
## node_caps splits as LR, improve=20.760610, (0 missing)
## tumor_size splits as LLRRRRRRRLR, improve= 9.751465, (0 missing)
## irradiat splits as LR, improve= 9.098196, (0 missing)
## menopause splits as RRL, improve= 2.881789, (0 missing)
## Surrogate splits:
## node_caps splits as LR, agree=0.892, adj=0.559, (0 split)
## irradiat splits as LR, agree=0.769, adj=0.059, (0 split)
##
## Node number 2: 209 observations, complexity param=0.01351351
## predicted class=2 expected loss=0.5358852 P(node) =0.7545126
## class counts: 65 97 47
## probabilities: 0.311 0.464 0.225
## left son=4 (73 obs) right son=5 (136 obs)
## Primary splits:
## tumor_size splits as LLLRRRRRLLL, improve=7.481480, (0 missing)
## node_caps splits as LR, improve=3.733983, (0 missing)
## breast_quad splits as LLRLR, improve=3.080368, (0 missing)
## irradiat splits as LR, improve=3.035000, (0 missing)
## menopause splits as RRL, improve=1.196347, (0 missing)
## Surrogate splits:
## breast_quad splits as LRRRR, agree=0.660, adj=0.027, (0 split)
## menopause splits as RLR, agree=0.656, adj=0.014, (0 split)
##
## Node number 3: 68 observations, complexity param=0.04391892
## predicted class=3 expected loss=0.4852941 P(node) =0.2454874
## class counts: 1 32 35
## probabilities: 0.015 0.471 0.515
## left son=6 (36 obs) right son=7 (32 obs)
## Primary splits:
## tumor_size splits as -RRLRLRRR-L, improve=4.914226, (0 missing)
## inv_nodes splits as -RRRLLL, improve=3.993382, (0 missing)
## menopause splits as R-L, improve=2.885781, (0 missing)
## breast splits as RL, improve=2.874078, (0 missing)
## breast_quad splits as LRLRL, improve=2.874078, (0 missing)
## Surrogate splits:
## inv_nodes splits as -RRLLRR, agree=0.632, adj=0.219, (0 split)
## irradiat splits as LR, agree=0.603, adj=0.156, (0 split)
## age splits as -LLRR-, agree=0.559, adj=0.063, (0 split)
## node_caps splits as LR, agree=0.544, adj=0.031, (0 split)
##
## Node number 4: 73 observations, complexity param=0.01126126
## predicted class=2 expected loss=0.4657534 P(node) =0.2635379
## class counts: 28 39 6
## probabilities: 0.384 0.534 0.082
## left son=8 (42 obs) right son=9 (31 obs)
## Primary splits:
## breast_quad splits as RLRLL, improve=2.319334, (0 missing)
## tumor_size splits as RLR-----LLR, improve=2.233882, (0 missing)
## irradiat splits as LR, improve=1.246302, (0 missing)
## age splits as -LRLLL, improve=1.116546, (0 missing)
## menopause splits as LRR, improve=1.096317, (0 missing)
## Surrogate splits:
## breast splits as LR, agree=0.630, adj=0.129, (0 split)
## node_caps splits as LR, agree=0.616, adj=0.097, (0 split)
## tumor_size splits as RLL-----LLL, agree=0.603, adj=0.065, (0 split)
## age splits as -LLLRL, agree=0.589, adj=0.032, (0 split)
## irradiat splits as LR, agree=0.589, adj=0.032, (0 split)
##
## Node number 5: 136 observations, complexity param=0.01351351
## predicted class=2 expected loss=0.5735294 P(node) =0.4909747
## class counts: 37 58 41
## probabilities: 0.272 0.426 0.301
## left son=10 (87 obs) right son=11 (49 obs)
## Primary splits:
## tumor_size splits as ---LLRRL---, improve=2.4450710, (0 missing)
## irradiat splits as LR, improve=2.4340000, (0 missing)
## menopause splits as RRL, improve=1.5358650, (0 missing)
## breast_quad splits as RRRLR, improve=1.3153470, (0 missing)
## age splits as LRLRRR, improve=0.9967619, (0 missing)
## Surrogate splits:
## menopause splits as LRL, agree=0.654, adj=0.041, (0 split)
## node_caps splits as LR, agree=0.654, adj=0.041, (0 split)
## age splits as RLLLLL, agree=0.647, adj=0.020, (0 split)
## breast_quad splits as LLLLR, agree=0.647, adj=0.020, (0 split)
##
## Node number 6: 36 observations, complexity param=0.02027027
## predicted class=2 expected loss=0.3611111 P(node) =0.1299639
## class counts: 0 23 13
## probabilities: 0.000 0.639 0.361
## left son=12 (21 obs) right son=13 (15 obs)
## Primary splits:
## menopause splits as R-L, improve=3.2256310, (0 missing)
## tumor_size splits as ---L-R----L, improve=1.5076650, (0 missing)
## breast_quad splits as LRRRL, improve=1.0070870, (0 missing)
## breast splits as RL, improve=0.5455044, (0 missing)
## age splits as -LLRR-, improve=0.3636598, (0 missing)
## Surrogate splits:
## age splits as -LLRR-, agree=0.861, adj=0.667, (0 split)
## breast_quad splits as LLLRL, agree=0.667, adj=0.200, (0 split)
## breast splits as RL, agree=0.639, adj=0.133, (0 split)
## inv_nodes splits as -LLRLLL, agree=0.611, adj=0.067, (0 split)
##
## Node number 7: 32 observations
## predicted class=3 expected loss=0.3125 P(node) =0.1155235
## class counts: 1 9 22
## probabilities: 0.031 0.281 0.688
##
## Node number 8: 42 observations, complexity param=0.01126126
## predicted class=2 expected loss=0.4285714 P(node) =0.1516245
## class counts: 17 24 1
## probabilities: 0.405 0.571 0.024
## left son=16 (17 obs) right son=17 (25 obs)
## Primary splits:
## age splits as -LRRLL, improve=2.3409030, (0 missing)
## tumor_size splits as LLR-----LRR, improve=1.6696220, (0 missing)
## menopause splits as LLR, improve=0.7583689, (0 missing)
## breast_quad splits as -R-LL, improve=0.5940572, (0 missing)
## breast splits as LR, improve=0.5723340, (0 missing)
## Surrogate splits:
## menopause splits as LRR, agree=0.643, adj=0.118, (0 split)
## breast_quad splits as -R-LR, agree=0.619, adj=0.059, (0 split)
##
## Node number 9: 31 observations, complexity param=0.01126126
## predicted class=2 expected loss=0.516129 P(node) =0.1119134
## class counts: 11 15 5
## probabilities: 0.355 0.484 0.161
## left son=18 (12 obs) right son=19 (19 obs)
## Primary splits:
## tumor_size splits as RLR------LR, improve=3.9323710, (0 missing)
## age splits as -RRLRR, improve=2.3978190, (0 missing)
## menopause splits as LRR, improve=1.7459430, (0 missing)
## breast splits as LR, improve=0.3546232, (0 missing)
## breast_quad splits as L-R--, improve=0.2327571, (0 missing)
## Surrogate splits:
## age splits as -RLRRL, agree=0.677, adj=0.167, (0 split)
## breast splits as LR, agree=0.645, adj=0.083, (0 split)
##
## Node number 10: 87 observations, complexity param=0.01351351
## predicted class=2 expected loss=0.5057471 P(node) =0.3140794
## class counts: 22 43 22
## probabilities: 0.253 0.494 0.253
## left son=20 (50 obs) right son=21 (37 obs)
## Primary splits:
## menopause splits as R-L, improve=4.0142610, (0 missing)
## breast_quad splits as LLRLR, improve=2.5566890, (0 missing)
## irradiat splits as LR, improve=2.1960260, (0 missing)
## age splits as -LLLRR, improve=1.3840990, (0 missing)
## breast splits as RL, improve=0.4670241, (0 missing)
## Surrogate splits:
## age splits as -LLRRR, agree=0.816, adj=0.568, (0 split)
## breast_quad splits as LLRLL, agree=0.609, adj=0.081, (0 split)
## tumor_size splits as ---RL--L---, agree=0.598, adj=0.054, (0 split)
##
## Node number 11: 49 observations, complexity param=0.01351351
## predicted class=3 expected loss=0.6122449 P(node) =0.1768953
## class counts: 15 15 19
## probabilities: 0.306 0.306 0.388
## left son=22 (30 obs) right son=23 (19 obs)
## Primary splits:
## breast_quad splits as RRLLL, improve=1.7055780, (0 missing)
## irradiat splits as LR, improve=1.2179070, (0 missing)
## tumor_size splits as -----LR----, improve=1.0609000, (0 missing)
## age splits as LRRRL-, improve=0.7532395, (0 missing)
## menopause splits as LRR, improve=0.4104658, (0 missing)
## Surrogate splits:
## breast splits as RL, agree=0.653, adj=0.105, (0 split)
##
## Node number 12: 21 observations
## predicted class=2 expected loss=0.1904762 P(node) =0.07581227
## class counts: 0 17 4
## probabilities: 0.000 0.810 0.190
##
## Node number 13: 15 observations
## predicted class=3 expected loss=0.4 P(node) =0.05415162
## class counts: 0 6 9
## probabilities: 0.000 0.400 0.600
##
## Node number 16: 17 observations
## predicted class=1 expected loss=0.4117647 P(node) =0.06137184
## class counts: 10 7 0
## probabilities: 0.588 0.412 0.000
##
## Node number 17: 25 observations
## predicted class=2 expected loss=0.32 P(node) =0.09025271
## class counts: 7 17 1
## probabilities: 0.280 0.680 0.040
##
## Node number 18: 12 observations
## predicted class=1 expected loss=0.4166667 P(node) =0.0433213
## class counts: 7 5 0
## probabilities: 0.583 0.417 0.000
##
## Node number 19: 19 observations
## predicted class=2 expected loss=0.4736842 P(node) =0.06859206
## class counts: 4 10 5
## probabilities: 0.211 0.526 0.263
##
## Node number 20: 50 observations
## predicted class=2 expected loss=0.42 P(node) =0.1805054
## class counts: 14 29 7
## probabilities: 0.280 0.580 0.140
##
## Node number 21: 37 observations, complexity param=0.01351351
## predicted class=3 expected loss=0.5945946 P(node) =0.133574
## class counts: 8 14 15
## probabilities: 0.216 0.378 0.405
## left son=42 (14 obs) right son=43 (23 obs)
## Primary splits:
## breast_quad splits as LLRRR, improve=1.7855190, (0 missing)
## breast splits as RL, improve=0.8710870, (0 missing)
## age splits as --RRLL, improve=0.7952993, (0 missing)
## tumor_size splits as ---RR--L---, improve=0.2003243, (0 missing)
## Surrogate splits:
## age splits as --RRLR, agree=0.649, adj=0.071, (0 split)
##
## Node number 22: 30 observations, complexity param=0.01351351
## predicted class=2 expected loss=0.6 P(node) =0.1083032
## class counts: 8 12 10
## probabilities: 0.267 0.400 0.333
## left son=44 (9 obs) right son=45 (21 obs)
## Primary splits:
## age splits as LLRRL-, improve=1.6322740, (0 missing)
## menopause splits as LRR, improve=0.9080533, (0 missing)
## breast_quad splits as --LRR, improve=0.6437860, (0 missing)
## tumor_size splits as -----LR----, improve=0.6418279, (0 missing)
## breast splits as LR, improve=0.4714349, (0 missing)
##
## Node number 23: 19 observations
## predicted class=3 expected loss=0.5263158 P(node) =0.06859206
## class counts: 7 3 9
## probabilities: 0.368 0.158 0.474
##
## Node number 42: 14 observations
## predicted class=2 expected loss=0.5 P(node) =0.05054152
## class counts: 4 7 3
## probabilities: 0.286 0.500 0.214
##
## Node number 43: 23 observations, complexity param=0.01351351
## predicted class=3 expected loss=0.4782609 P(node) =0.08303249
## class counts: 4 7 12
## probabilities: 0.174 0.304 0.522
## left son=86 (11 obs) right son=87 (12 obs)
## Primary splits:
## breast splits as RL, improve=2.735390, (0 missing)
## tumor_size splits as ---LR--R---, improve=2.650165, (0 missing)
## age splits as --RRLL, improve=1.319145, (0 missing)
## Surrogate splits:
## breast_quad splits as --LRR, agree=0.609, adj=0.182, (0 split)
## age splits as --RRRL, agree=0.565, adj=0.091, (0 split)
## node_caps splits as RL, agree=0.565, adj=0.091, (0 split)
## tumor_size splits as ---RR--L---, agree=0.565, adj=0.091, (0 split)
##
## Node number 44: 9 observations
## predicted class=2 expected loss=0.4444444 P(node) =0.03249097
## class counts: 3 5 1
## probabilities: 0.333 0.556 0.111
##
## Node number 45: 21 observations
## predicted class=3 expected loss=0.5714286 P(node) =0.07581227
## class counts: 5 7 9
## probabilities: 0.238 0.333 0.429
##
## Node number 86: 11 observations
## predicted class=2 expected loss=0.5454545 P(node) =0.03971119
## class counts: 3 5 3
## probabilities: 0.273 0.455 0.273
##
## Node number 87: 12 observations
## predicted class=3 expected loss=0.25 P(node) =0.0433213
## class counts: 1 2 9
## probabilities: 0.083 0.167 0.750
# Draw the fitted tree.
#   type = 4         label every node, not only the leaves
#   extra = 2        show correct classifications / observations in each node
#   roundint = FALSE do not round split values to integers
rpart.plot(
  fit,
  type = 4,
  extra = 2,
  roundint = FALSE
)

Decision tree using custom settings
# Re-seed with the same value so the cross-validated columns of the CP table
# are reproducible for this fit as well.
set.seed(20)

# Same model formula and splitting criterion (information gain), but with
# explicit control settings: minsplit = 4 lets nodes with as few as four
# observations be considered for a split, and cp = 0.01 is the complexity
# threshold a split must reach to be kept.
fit <- rpart(
  formula = deg_malig ~ age + breast + breast_quad + inv_nodes + irradiat +
    menopause + node_caps + tumor_size,
  data = breast_cancer,
  method = "class",
  parms = list(split = "information"),
  control = rpart.control(minsplit = 4, cp = 0.01)
)

# Print the CP table, variable importance and the per-node split details.
summary(fit)
## Call:
## rpart(formula = deg_malig ~ age + breast + breast_quad + inv_nodes +
## irradiat + menopause + node_caps + tumor_size, data = breast_cancer,
## method = "class", parms = list(split = "information"), control = rpart.control(minsplit = 4,
## cp = 0.01))
## n= 277
##
## CP nsplit rel error xerror xstd
## 1 0.02702703 0 1.0000000 1.000000 0.05609499
## 2 0.01351351 4 0.8918919 1.013514 0.05603326
## 3 0.01216216 9 0.8243243 1.074324 0.05560809
## 4 0.01126126 14 0.7635135 1.121622 0.05510791
## 5 0.01013514 18 0.7162162 1.121622 0.05510791
## 6 0.01000000 20 0.6959459 1.121622 0.05510791
##
## Variable importance
## tumor_size inv_nodes breast_quad node_caps age breast
## 27 21 13 11 10 8
## irradiat menopause
## 5 5
##
## Node number 1: 277 observations, complexity param=0.02702703
## predicted class=2 expected loss=0.534296 P(node) =1
## class counts: 66 129 82
## probabilities: 0.238 0.466 0.296
## left son=2 (209 obs) right son=3 (68 obs)
## Primary splits:
## inv_nodes splits as LRRRRRR, improve=20.974280, (0 missing)
## node_caps splits as LR, improve=20.760610, (0 missing)
## tumor_size splits as LLRRRRRRRLR, improve= 9.751465, (0 missing)
## irradiat splits as LR, improve= 9.098196, (0 missing)
## menopause splits as RRL, improve= 2.881789, (0 missing)
## Surrogate splits:
## node_caps splits as LR, agree=0.892, adj=0.559, (0 split)
## irradiat splits as LR, agree=0.769, adj=0.059, (0 split)
##
## Node number 2: 209 observations, complexity param=0.01351351
## predicted class=2 expected loss=0.5358852 P(node) =0.7545126
## class counts: 65 97 47
## probabilities: 0.311 0.464 0.225
## left son=4 (73 obs) right son=5 (136 obs)
## Primary splits:
## tumor_size splits as LLLRRRRRLLL, improve=7.481480, (0 missing)
## node_caps splits as LR, improve=3.733983, (0 missing)
## breast_quad splits as LLRLR, improve=3.080368, (0 missing)
## irradiat splits as LR, improve=3.035000, (0 missing)
## menopause splits as RRL, improve=1.196347, (0 missing)
## Surrogate splits:
## breast_quad splits as LRRRR, agree=0.660, adj=0.027, (0 split)
## menopause splits as RLR, agree=0.656, adj=0.014, (0 split)
##
## Node number 3: 68 observations, complexity param=0.02702703
## predicted class=3 expected loss=0.4852941 P(node) =0.2454874
## class counts: 1 32 35
## probabilities: 0.015 0.471 0.515
## left son=6 (62 obs) right son=7 (6 obs)
## Primary splits:
## tumor_size splits as -RRLLLLLR-L, improve=5.939564, (0 missing)
## inv_nodes splits as -RRRLLL, improve=3.993382, (0 missing)
## menopause splits as R-L, improve=2.885781, (0 missing)
## breast splits as RL, improve=2.874078, (0 missing)
## breast_quad splits as LRLRL, improve=2.874078, (0 missing)
##
## Node number 4: 73 observations, complexity param=0.01126126
## predicted class=2 expected loss=0.4657534 P(node) =0.2635379
## class counts: 28 39 6
## probabilities: 0.384 0.534 0.082
## left son=8 (42 obs) right son=9 (31 obs)
## Primary splits:
## breast_quad splits as RLRLL, improve=2.319334, (0 missing)
## tumor_size splits as RLR-----LLR, improve=2.233882, (0 missing)
## node_caps splits as LR, improve=1.921021, (0 missing)
## irradiat splits as LR, improve=1.246302, (0 missing)
## age splits as -LRLLL, improve=1.116546, (0 missing)
## Surrogate splits:
## breast splits as LR, agree=0.630, adj=0.129, (0 split)
## node_caps splits as LR, agree=0.616, adj=0.097, (0 split)
## tumor_size splits as RLL-----LLL, agree=0.603, adj=0.065, (0 split)
## age splits as -LLLRL, agree=0.589, adj=0.032, (0 split)
## irradiat splits as LR, agree=0.589, adj=0.032, (0 split)
##
## Node number 5: 136 observations, complexity param=0.01351351
## predicted class=2 expected loss=0.5735294 P(node) =0.4909747
## class counts: 37 58 41
## probabilities: 0.272 0.426 0.301
## left son=10 (87 obs) right son=11 (49 obs)
## Primary splits:
## tumor_size splits as ---LLRRL---, improve=2.445071, (0 missing)
## irradiat splits as LR, improve=2.434000, (0 missing)
## node_caps splits as LR, improve=2.052153, (0 missing)
## age splits as RRRRRL, improve=1.927031, (0 missing)
## menopause splits as RRL, improve=1.535865, (0 missing)
## Surrogate splits:
## menopause splits as LRL, agree=0.654, adj=0.041, (0 split)
## node_caps splits as LR, agree=0.654, adj=0.041, (0 split)
## age splits as RLLLLL, agree=0.647, adj=0.020, (0 split)
## breast_quad splits as LLLLR, agree=0.647, adj=0.020, (0 split)
##
## Node number 6: 62 observations, complexity param=0.02702703
## predicted class=2 expected loss=0.483871 P(node) =0.2238267
## class counts: 0 32 30
## probabilities: 0.000 0.516 0.484
## left son=12 (15 obs) right son=13 (47 obs)
## Primary splits:
## tumor_size splits as ---LRRRR--L, improve=3.382129, (0 missing)
## inv_nodes splits as -RRRLLL, improve=3.093532, (0 missing)
## menopause splits as R-L, improve=2.619234, (0 missing)
## breast_quad splits as LRLRL, improve=2.090369, (0 missing)
## breast splits as RL, improve=1.582488, (0 missing)
## Surrogate splits:
## inv_nodes splits as -RRLRRR, agree=0.774, adj=0.067, (0 split)
##
## Node number 7: 6 observations
## predicted class=3 expected loss=0.1666667 P(node) =0.02166065
## class counts: 1 0 5
## probabilities: 0.167 0.000 0.833
##
## Node number 8: 42 observations, complexity param=0.01126126
## predicted class=2 expected loss=0.4285714 P(node) =0.1516245
## class counts: 17 24 1
## probabilities: 0.405 0.571 0.024
## left son=16 (17 obs) right son=17 (25 obs)
## Primary splits:
## age splits as -LRRLL, improve=2.3409030, (0 missing)
## tumor_size splits as LLR-----LRR, improve=1.6696220, (0 missing)
## menopause splits as LLR, improve=0.7583689, (0 missing)
## breast_quad splits as -R-LL, improve=0.5940572, (0 missing)
## breast splits as LR, improve=0.5723340, (0 missing)
## Surrogate splits:
## menopause splits as LRR, agree=0.643, adj=0.118, (0 split)
## breast_quad splits as -R-LR, agree=0.619, adj=0.059, (0 split)
##
## Node number 9: 31 observations, complexity param=0.01126126
## predicted class=2 expected loss=0.516129 P(node) =0.1119134
## class counts: 11 15 5
## probabilities: 0.355 0.484 0.161
## left son=18 (12 obs) right son=19 (19 obs)
## Primary splits:
## tumor_size splits as RLR------LR, improve=3.932371, (0 missing)
## irradiat splits as LR, improve=3.181426, (0 missing)
## age splits as -RRLRR, improve=2.397819, (0 missing)
## menopause splits as LRL, improve=1.915670, (0 missing)
## node_caps splits as LR, improve=1.463911, (0 missing)
## Surrogate splits:
## age splits as -RLRRL, agree=0.677, adj=0.167, (0 split)
## breast splits as LR, agree=0.645, adj=0.083, (0 split)
##
## Node number 10: 87 observations, complexity param=0.01216216
## predicted class=2 expected loss=0.5057471 P(node) =0.3140794
## class counts: 22 43 22
## probabilities: 0.253 0.494 0.253
## left son=20 (50 obs) right son=21 (37 obs)
## Primary splits:
## menopause splits as R-L, improve=4.014261, (0 missing)
## breast_quad splits as LLRLR, improve=2.556689, (0 missing)
## age splits as -RRRRL, improve=2.279601, (0 missing)
## irradiat splits as LR, improve=2.196026, (0 missing)
## node_caps splits as RL, improve=1.433499, (0 missing)
## Surrogate splits:
## age splits as -LLRRR, agree=0.816, adj=0.568, (0 split)
## breast_quad splits as LLRLL, agree=0.609, adj=0.081, (0 split)
## tumor_size splits as ---RL--L---, agree=0.598, adj=0.054, (0 split)
##
## Node number 11: 49 observations, complexity param=0.01351351
## predicted class=3 expected loss=0.6122449 P(node) =0.1768953
## class counts: 15 15 19
## probabilities: 0.306 0.306 0.388
## left son=22 (2 obs) right son=23 (47 obs)
## Primary splits:
## breast_quad splits as RRRLR, improve=2.465846, (0 missing)
## node_caps splits as LR, improve=1.893171, (0 missing)
## irradiat splits as LR, improve=1.217907, (0 missing)
## age splits as LRRRR-, improve=1.207596, (0 missing)
## tumor_size splits as -----LR----, improve=1.060900, (0 missing)
##
## Node number 12: 15 observations
## predicted class=2 expected loss=0.2 P(node) =0.05415162
## class counts: 0 12 3
## probabilities: 0.000 0.800 0.200
##
## Node number 13: 47 observations, complexity param=0.02702703
## predicted class=3 expected loss=0.4255319 P(node) =0.1696751
## class counts: 0 20 27
## probabilities: 0.000 0.426 0.574
## left son=26 (24 obs) right son=27 (23 obs)
## Primary splits:
## breast_quad splits as LRLRL, improve=2.5528750, (0 missing)
## inv_nodes splits as -RR-LLL, improve=1.5080160, (0 missing)
## breast splits as RL, improve=1.2247570, (0 missing)
## age splits as -RLRL-, improve=0.7515622, (0 missing)
## tumor_size splits as ----RLRR---, improve=0.7515622, (0 missing)
## Surrogate splits:
## breast splits as RL, agree=0.872, adj=0.739, (0 split)
## age splits as -LLRL-, agree=0.681, adj=0.348, (0 split)
## menopause splits as R-L, agree=0.660, adj=0.304, (0 split)
## node_caps splits as LR, agree=0.596, adj=0.174, (0 split)
## inv_nodes splits as -LL-LRL, agree=0.574, adj=0.130, (0 split)
##
## Node number 16: 17 observations, complexity param=0.01126126
## predicted class=1 expected loss=0.4117647 P(node) =0.06137184
## class counts: 10 7 0
## probabilities: 0.588 0.412 0.000
## left son=32 (15 obs) right son=33 (2 obs)
## Primary splits:
## tumor_size splits as LLL-----LRR, improve=1.9696920, (0 missing)
## breast_quad splits as -R-RL, improve=1.1535550, (0 missing)
## breast splits as RL, improve=0.6976266, (0 missing)
## age splits as -R--RL, improve=0.5523776, (0 missing)
## irradiat splits as RL, improve=0.5523776, (0 missing)
##
## Node number 17: 25 observations
## predicted class=2 expected loss=0.32 P(node) =0.09025271
## class counts: 7 17 1
## probabilities: 0.280 0.680 0.040
##
## Node number 18: 12 observations
## predicted class=1 expected loss=0.4166667 P(node) =0.0433213
## class counts: 7 5 0
## probabilities: 0.583 0.417 0.000
##
## Node number 19: 19 observations
## predicted class=2 expected loss=0.4736842 P(node) =0.06859206
## class counts: 4 10 5
## probabilities: 0.211 0.526 0.263
##
## Node number 20: 50 observations, complexity param=0.01013514
## predicted class=2 expected loss=0.42 P(node) =0.1805054
## class counts: 14 29 7
## probabilities: 0.280 0.580 0.140
## left son=40 (42 obs) right son=41 (8 obs)
## Primary splits:
## irradiat splits as LR, improve=3.9554440, (0 missing)
## breast_quad splits as RRRLR, improve=1.4269000, (0 missing)
## tumor_size splits as ---RR--L---, improve=1.3395510, (0 missing)
## node_caps splits as LR, improve=0.5521029, (0 missing)
## age splits as -RLL--, improve=0.3090612, (0 missing)
##
## Node number 21: 37 observations, complexity param=0.01216216
## predicted class=3 expected loss=0.5945946 P(node) =0.133574
## class counts: 8 14 15
## probabilities: 0.216 0.378 0.405
## left son=42 (32 obs) right son=43 (5 obs)
## Primary splits:
## breast_quad splits as LLLRR, improve=2.6485070, (0 missing)
## age splits as --RRRL, improve=2.2392370, (0 missing)
## node_caps splits as RL, improve=0.9948200, (0 missing)
## irradiat splits as LR, improve=0.9233306, (0 missing)
## breast splits as RL, improve=0.8710870, (0 missing)
## Surrogate splits:
## irradiat splits as LR, agree=0.892, adj=0.2, (0 split)
##
## Node number 22: 2 observations
## predicted class=2 expected loss=0 P(node) =0.007220217
## class counts: 0 2 0
## probabilities: 0.000 1.000 0.000
##
## Node number 23: 47 observations
## predicted class=3 expected loss=0.5957447 P(node) =0.1696751
## class counts: 15 13 19
## probabilities: 0.319 0.277 0.404
##
## Node number 26: 24 observations, complexity param=0.01351351
## predicted class=2 expected loss=0.4166667 P(node) =0.0866426
## class counts: 0 14 10
## probabilities: 0.000 0.583 0.417
## left son=52 (4 obs) right son=53 (20 obs)
## Primary splits:
## age splits as -RRRL-, improve=2.4376950, (0 missing)
## inv_nodes splits as -RR-RLL, improve=1.1694330, (0 missing)
## breast_quad splits as L-R-L, improve=0.7116023, (0 missing)
## irradiat splits as RL, improve=0.3447022, (0 missing)
## breast splits as LR, improve=0.2885215, (0 missing)
## Surrogate splits:
## breast_quad splits as L-R-R, agree=0.875, adj=0.25, (0 split)
##
## Node number 27: 23 observations
## predicted class=3 expected loss=0.2608696 P(node) =0.08303249
## class counts: 0 6 17
## probabilities: 0.000 0.261 0.739
##
## Node number 32: 15 observations
## predicted class=1 expected loss=0.3333333 P(node) =0.05415162
## class counts: 10 5 0
## probabilities: 0.667 0.333 0.000
##
## Node number 33: 2 observations
## predicted class=2 expected loss=0 P(node) =0.007220217
## class counts: 0 2 0
## probabilities: 0.000 1.000 0.000
##
## Node number 40: 42 observations
## predicted class=2 expected loss=0.3809524 P(node) =0.1516245
## class counts: 13 26 3
## probabilities: 0.310 0.619 0.071
##
## Node number 41: 8 observations, complexity param=0.01013514
## predicted class=3 expected loss=0.5 P(node) =0.02888087
## class counts: 1 3 4
## probabilities: 0.125 0.375 0.500
## left son=82 (4 obs) right son=83 (4 obs)
## Primary splits:
## breast splits as LR, improve=3.2958370, (0 missing)
## tumor_size splits as ---RL--L---, improve=1.7260920, (0 missing)
## age splits as -LLR--, improve=0.7648207, (0 missing)
## breast_quad splits as -LR--, improve=0.6103747, (0 missing)
## Surrogate splits:
## age splits as -LRR--, agree=0.750, adj=0.50, (0 split)
## breast_quad splits as -RL--, agree=0.625, adj=0.25, (0 split)
## tumor_size splits as ---RR--L---, agree=0.625, adj=0.25, (0 split)
##
## Node number 42: 32 observations, complexity param=0.01216216
## predicted class=2 expected loss=0.5625 P(node) =0.1155235
## class counts: 6 14 12
## probabilities: 0.188 0.438 0.375
## left son=84 (14 obs) right son=85 (18 obs)
## Primary splits:
## breast_quad splits as LLR--, improve=1.6588870, (0 missing)
## age splits as --RRRL, improve=1.3359340, (0 missing)
## node_caps splits as RL, improve=0.8474846, (0 missing)
## tumor_size splits as ---LR--L---, improve=0.4361799, (0 missing)
## breast splits as RL, improve=0.3107940, (0 missing)
## Surrogate splits:
## tumor_size splits as ---RL--R---, agree=0.656, adj=0.214, (0 split)
## age splits as --RRLR, agree=0.625, adj=0.143, (0 split)
##
## Node number 43: 5 observations
## predicted class=3 expected loss=0.4 P(node) =0.01805054
## class counts: 2 0 3
## probabilities: 0.400 0.000 0.600
##
## Node number 52: 4 observations
## predicted class=2 expected loss=0 P(node) =0.01444043
## class counts: 0 4 0
## probabilities: 0.000 1.000 0.000
##
## Node number 53: 20 observations, complexity param=0.01351351
## predicted class=2 expected loss=0.5 P(node) =0.07220217
## class counts: 0 10 10
## probabilities: 0.000 0.500 0.500
## left son=106 (8 obs) right son=107 (12 obs)
## Primary splits:
## inv_nodes splits as -RR-RLL, improve=1.7260920, (0 missing)
## age splits as -LLR--, improve=1.2657560, (0 missing)
## menopause splits as R-L, improve=0.6485757, (0 missing)
## tumor_size splits as ----RLLR---, improve=0.4201185, (0 missing)
## irradiat splits as RL, improve=0.4027103, (0 missing)
## Surrogate splits:
## age splits as -LRR--, agree=0.65, adj=0.125, (0 split)
## tumor_size splits as ----RRLR---, agree=0.65, adj=0.125, (0 split)
##
## Node number 82: 4 observations
## predicted class=2 expected loss=0.25 P(node) =0.01444043
## class counts: 0 3 1
## probabilities: 0.000 0.750 0.250
##
## Node number 83: 4 observations
## predicted class=3 expected loss=0.25 P(node) =0.01444043
## class counts: 1 0 3
## probabilities: 0.250 0.000 0.750
##
## Node number 84: 14 observations, complexity param=0.01216216
## predicted class=2 expected loss=0.5 P(node) =0.05054152
## class counts: 4 7 3
## probabilities: 0.286 0.500 0.214
## left son=168 (6 obs) right son=169 (8 obs)
## Primary splits:
## tumor_size splits as ---LR--R---, improve=2.5310160, (0 missing)
## age splits as --RLR-, improve=1.5716460, (0 missing)
## breast_quad splits as RL---, improve=0.7316467, (0 missing)
## breast splits as LR, improve=0.6214736, (0 missing)
## Surrogate splits:
## breast_quad splits as LR---, agree=0.643, adj=0.167, (0 split)
##
## Node number 85: 18 observations, complexity param=0.01216216
## predicted class=3 expected loss=0.5 P(node) =0.06498195
## class counts: 2 7 9
## probabilities: 0.111 0.389 0.500
## left son=170 (10 obs) right son=171 (8 obs)
## Primary splits:
## breast splits as RL, improve=2.4487940, (0 missing)
## age splits as --RRLL, improve=2.1119580, (0 missing)
## tumor_size splits as ---RR--L---, improve=1.9564520, (0 missing)
## node_caps splits as RL, improve=0.9912506, (0 missing)
##
## Node number 106: 8 observations
## predicted class=2 expected loss=0.25 P(node) =0.02888087
## class counts: 0 6 2
## probabilities: 0.000 0.750 0.250
##
## Node number 107: 12 observations
## predicted class=3 expected loss=0.3333333 P(node) =0.0433213
## class counts: 0 4 8
## probabilities: 0.000 0.333 0.667
##
## Node number 168: 6 observations
## predicted class=1 expected loss=0.5 P(node) =0.02166065
## class counts: 3 1 2
## probabilities: 0.500 0.167 0.333
##
## Node number 169: 8 observations
## predicted class=2 expected loss=0.25 P(node) =0.02888087
## class counts: 1 6 1
## probabilities: 0.125 0.750 0.125
##
## Node number 170: 10 observations
## predicted class=2 expected loss=0.5 P(node) =0.03610108
## class counts: 2 5 3
## probabilities: 0.200 0.500 0.300
##
## Node number 171: 8 observations
## predicted class=3 expected loss=0.25 P(node) =0.02888087
## class counts: 0 2 6
## probabilities: 0.000 0.250 0.750
# Draw the tree grown with the custom control settings.
#   type = 4         label every node, not only the leaves
#   extra = 2        show correct classifications / observations in each node
#   roundint = FALSE do not round split values to integers
rpart.plot(
  fit,
  type = 4,
  extra = 2,
  roundint = FALSE
)
